\relax 
\emailauthor{s.f.cardosodearaujo@tudelft.nl}{Samur Araujo}
\emailauthor{a.p.devries@tudelft.nl}{Arjen de Vries}
\citation{DBLP:conf/popl/Gulwani11}
\citation{DBLP:journals/cacm/GulwaniHS12}
\citation{DBLP:journals/cacm/GulwaniHS12}
\citation{DBLP:journals/aim/Lau09}
\citation{DBLP:journals/pvldb/ArasuCK09}
\citation{DBLP:conf/icai/MichelsonK09}
\@writefile{toc}{\contentsline {section}{\numberline {1}Introduction}{1}}
\citation{DBLP:conf/emnlp/OkazakiTAT08}
\@writefile{lot}{\contentsline {table}{\numberline {1}{\ignorespaces Examples of String Transformations}}{2}}
\newlabel{table:ruleexamples}{{1}{2}}
\@writefile{toc}{\contentsline {subsection}{\numberline {1.1}Overview and Contributions}{2}}
\citation{levelshtein-66-binary}
\@writefile{toc}{\contentsline {section}{\numberline {2}Learning Transformations}{3}}
\newlabel{sec:problem}{{2}{3}}
\@writefile{toc}{\contentsline {subsection}{\numberline {2.1}Preliminary Definitions}{3}}
\@writefile{toc}{\contentsline {subsection}{\numberline {2.2}Transformation Rules}{4}}
\@writefile{toc}{\contentsline {subsection}{\numberline {2.3}Generalization of Transformation Rules}{4}}
\@writefile{toc}{\contentsline {subsection}{\numberline {2.4}Learning Problem}{5}}
\@writefile{toc}{\contentsline {section}{\numberline {3}Rule Learner Algorithm}{5}}
\newlabel{sec:algorithm}{{3}{5}}
\@writefile{toc}{\contentsline {subsection}{\numberline {3.1}Rule Learning}{6}}
\@writefile{toc}{\contentsline {subsection}{\numberline {3.2}Relative Position Algorithm}{6}}
\@writefile{lof}{\contentsline {figure}{\numberline {1}{\ignorespaces String $u=``Noia, La"$, $u^c=\textbf  {zulllpsulz}$, $E_2(u^c)=\{\textbf  {zu, ul, ll, ll, lp, ps, su, ul, lz}\}$, $w_{e_1}=\textbf  {zulllpsu}$ and $w_{e_9}=\textbf  {ulz}$.}}{6}}
\newlabel{fig:diagram}{{1}{6}}
\newlabel{eq:relative}{{3}{6}}
\newlabel{eq:fremean}{{4}{6}}
\@writefile{loa}{\contentsline {algorithm}{\numberline {1}{\ignorespaces RelativePosition($u$, $i$, $n$).}}{6}}
\newlabel{alg:relativeposition}{{1}{6}}
\@writefile{toc}{\contentsline {subsection}{\numberline {3.3}Permutation Rule Learner}{6}}
\citation{2009design}
\newlabel{eq:permutation}{{6}{7}}
\newlabel{lemma:ss}{{1}{7}}
\@writefile{loa}{\contentsline {algorithm}{\numberline {2}{\ignorespaces Sorting($t_c$, $v$).}}{7}}
\newlabel{alg:ss}{{2}{7}}
\@writefile{toc}{\contentsline {subsection}{\numberline {3.4}Insertions and Deletions Rule Learner}{7}}
\@writefile{lof}{\contentsline {figure}{\numberline {2}{\ignorespaces All common substrings between $u_p = ``Aug\ 06,\ 2013"$ and $v = ``06/08/13"$.}}{8}}
\newlabel{fig:permutation}{{2}{8}}
\@writefile{toc}{\contentsline {subsection}{\numberline {3.5}Update Rule Learner }{8}}
\@writefile{toc}{\contentsline {subsection}{\numberline {3.6}Discussion}{8}}
\@writefile{toc}{\contentsline {section}{\numberline {4}Rule Selector Method}{8}}
\newlabel{sec:rulelearner}{{4}{8}}
\citation{Ziegler:2005:IRL:1060745.1060754}
\@writefile{toc}{\contentsline {section}{\numberline {5}Evaluation}{9}}
\newlabel{sec:evaluations}{{5}{9}}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.1}Data}{9}}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.2}Evaluation Metric }{10}}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.3}Rule Coverage}{10}}
\@writefile{lot}{\contentsline {table}{\numberline {2}{\ignorespaces  Maximal Coverage Per Task }}{10}}
\newlabel{table:rulecoverage}{{2}{10}}
\@writefile{lot}{\contentsline {table}{\numberline {3}{\ignorespaces  The first 7 rules with the highest coverage for the Abbreviations dataset using $E_2$. }}{10}}
\newlabel{table:coverageabbreviations}{{3}{10}}
\@writefile{lot}{\contentsline {table}{\numberline {4}{\ignorespaces  The first 11 rules with the highest coverage for the Books dataset using $E_2$. }}{10}}
\newlabel{table:coveragebooks}{{4}{10}}
\citation{1183917}
\citation{DBLP:conf/popl/Gulwani11,DBLP:journals/cacm/GulwaniHS12}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.4}Rule Selector Accuracy}{11}}
\@writefile{lot}{\contentsline {table}{\numberline {5}{\ignorespaces Abbreviations Examples}}{11}}
\newlabel{table:abbreviationsexamples}{{5}{11}}
\@writefile{lot}{\contentsline {table}{\numberline {6}{\ignorespaces Book Titles Examples}}{11}}
\newlabel{table:bookexamples}{{6}{11}}
\@writefile{lot}{\contentsline {table}{\numberline {7}{\ignorespaces Song Examples}}{11}}
\newlabel{table:songexamples}{{7}{11}}
\@writefile{lot}{\contentsline {table}{\numberline {8}{\ignorespaces Dates Examples}}{11}}
\newlabel{table:datesexamples}{{8}{11}}
\@writefile{lot}{\contentsline {table}{\numberline {9}{\ignorespaces Accuracy of the Rule Algorithm With $E_2$}}{11}}
\newlabel{table:results}{{9}{11}}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.5}Runtime Cost}{11}}
\@writefile{toc}{\contentsline {subsection}{\numberline {5.6}Performance Comparison}{11}}
\citation{DBLP:journals/pvldb/ArasuCK09}
\citation{DBLP:conf/icai/MichelsonK09}
\citation{DBLP:conf/dexa/PatroW11}
\citation{DBLP:conf/kdd/TejadaKM02}
\@writefile{lof}{\contentsline {figure}{\numberline {3}{\ignorespaces Learning time varying the sample size for the Books dataset. We considered 4 runs for each sample size.}}{12}}
\newlabel{fig:time}{{3}{12}}
\@writefile{lot}{\contentsline {table}{\numberline {10}{\ignorespaces Average accuracy per systems.}}{12}}
\newlabel{table:comparisonflashfill}{{10}{12}}
\@writefile{toc}{\contentsline {section}{\numberline {6}Related Work}{12}}
\newlabel{sec:relatedwork}{{6}{12}}
\citation{DBLP:conf/emnlp/OkazakiTAT08}
\citation{DBLP:conf/popl/Gulwani11}
\citation{DBLP:journals/pvldb/SinghG12}
\citation{DBLP:conf/aaai/WuSK12}
\citation{conf/acl/SattaH97}
\citation{DBLP:conf/vldb/RamanH01}
\bibstyle{model1-num-names}
\bibdata{../paper}
\bibcite{DBLP:conf/popl/Gulwani11}{{1}{2011}{{Gulwani}}{{}}}
\bibcite{DBLP:journals/cacm/GulwaniHS12}{{2}{2012}{{Gulwani et~al.}}{{Gulwani, Harris, and Singh}}}
\bibcite{DBLP:journals/aim/Lau09}{{3}{2009}{{Lau}}{{}}}
\bibcite{DBLP:journals/pvldb/ArasuCK09}{{4}{2009}{{Arasu et~al.}}{{Arasu, Chaudhuri, and Kaushik}}}
\bibcite{DBLP:conf/icai/MichelsonK09}{{5}{2009}{{Michelson and Knoblock}}{{}}}
\bibcite{DBLP:conf/emnlp/OkazakiTAT08}{{6}{2008}{{Okazaki et~al.}}{{Okazaki, Tsuruoka, Ananiadou, and ichi Tsujii}}}
\bibcite{levelshtein-66-binary}{{7}{1966}{{Levenshtein}}{{}}}
\bibcite{2009design}{{8}{2009}{{200}}{{}}}
\bibcite{Ziegler:2005:IRL:1060745.1060754}{{9}{2005}{{Ziegler et~al.}}{{Ziegler, McNee, Konstan, and Lausen}}}
\bibcite{1183917}{{10}{2002}{{Molina et~al.}}{{Molina, Belanche, and Nebot}}}
\bibcite{DBLP:conf/dexa/PatroW11}{{11}{2011}{{Patro and Wang}}{{}}}
\bibcite{DBLP:conf/kdd/TejadaKM02}{{12}{2002}{{Tejada et~al.}}{{Tejada, Knoblock, and Minton}}}
\bibcite{DBLP:journals/pvldb/SinghG12}{{13}{2012}{{Singh and Gulwani}}{{}}}
\bibcite{DBLP:conf/aaai/WuSK12}{{14}{2012}{{Wu et~al.}}{{Wu, Szekely, and Knoblock}}}
\bibcite{conf/acl/SattaH97}{{15}{1997}{{Satta and Henderson}}{{}}}
\bibcite{DBLP:conf/vldb/RamanH01}{{16}{2001}{{Raman and Hellerstein}}{{}}}
\@writefile{toc}{\contentsline {section}{\numberline {7}Conclusions}{13}}
